<- read_csv('https://bcdanl.github.io/data/custdata_rev.csv') health_cust
Let’s analyze the homework 4
data:
Housing Type Statistics
<- health_cust |>
housing_type_statistics group_by(housing_type) |>
summarize(
mean = mean(income, na.rm = TRUE),
SD = sd(income, na.rm = TRUE),
Q1 = quantile(income, probs = 0.25, na.rm = TRUE),
Median = median(income, na.rm = TRUE),
Q3 = quantile(income, probs = 0.75, na.rm = TRUE),
Max = max(income, na.rm = TRUE)
)
State of Residency Statistics
<- health_cust |>
state_statistics group_by(state_of_res) |>
summarize(
mean = mean(income, na.rm = TRUE),
SD = sd(income, na.rm = TRUE),
Q1 = quantile(income, probs = 0.25, na.rm = TRUE),
Median = median(income, na.rm = TRUE),
Q3 = quantile(income, probs = 0.75, na.rm = TRUE),
Max = max(income, na.rm = TRUE)
)
Marital Status Statistics
<- health_cust |>
marital_statistics group_by(marital_status) |>
summarize(
mean = mean(income, na.rm = TRUE),
SD = sd(income, na.rm = TRUE),
Q1 = quantile(income, probs = 0.25, na.rm = TRUE),
Median = median(income, na.rm = TRUE),
Q3 = quantile(income, probs = 0.75, na.rm = TRUE),
Max = max(income, na.rm = TRUE)
)
Income by Housing Type
<- health_cust |>
income_by_housing_type group_by(income, housing_type) |>
summarize(Count = n(), .groups = "drop") |>
group_by(housing_type) |>
arrange(desc(income))